import sys

def _iter_utterance_ids(path):
    """Yield the first whitespace-separated token of each non-blank line.

    Each line of the file at *path* is split on whitespace and its first
    token is treated as the utterance ID. Blank or whitespace-only lines
    are skipped so they cannot raise ``IndexError``.
    """
    with open(path, 'r', encoding='utf-8') as handle:
        for line in handle:
            parts = line.split()
            if parts:
                yield parts[0]


def main(argv=None):
    """Report utterance IDs of the second file that also occur in the first.

    Args:
        argv: Argument vector laid out like ``sys.argv`` (program name,
            first/"train" file, second/"test" file). Defaults to
            ``sys.argv`` when omitted.

    Returns:
        The number of lines in the second file whose ID is present in the
        first file. An ID repeated in the second file is counted each time
        it appears.

    Raises:
        SystemExit: If fewer than two file paths are supplied.
    """
    if argv is None:
        argv = sys.argv
    if len(argv) < 3:
        prog = argv[0] if argv else 'script'
        sys.exit('Usage: %s <train_text> <test_text>' % prog)

    text_1 = argv[1]  # train
    text_2 = argv[2]  # test

    # Only the IDs are needed for the membership test, so keep a set rather
    # than a dict holding the (unused) remainder of every line.
    refers = set(_iter_utterance_ids(text_1))

    count = 0
    for idx in _iter_utterance_ids(text_2):
        if idx in refers:
            count += 1
            # Interpolate the ID; the bare format string used to be printed.
            print('%s is repetitive.' % idx)

    print('There are %d repetitive utterances between these two file.' % count)
    return count


if __name__ == '__main__':
    main()